Expert(Sto) Return Avg: 3494.31, std: 9.77
array([3506.584, 3490.196, 3501.847, 3479.176, 3483.817, 3493.678,
       3490.362, 3502.376, 3512.96 , 3503.75 , 3480.46 , 3509.224,
       3493.809, 3489.614, 3501.114, 3507.032, 3487.71 , 3510.834,
       3501.506, 3512.044, 3493.558, 3503.494, 3507.378, 3506.112,
       3502.106, 3481.233, 3497.378, 3491.08 , 3494.132, 3488.929,
       3494.967, 3482.417, 3481.459, 3489.951, 3488.257, 3492.08 ,
       3484.725, 3502.682, 3499.977, 3493.042, 3514.677, 3495.574,
       3504.513, 3493.816, 3494.608, 3484.887, 3488.873, 3486.479,
       3487.311, 3497.588, 3492.103, 3482.593, 3479.339, 3489.158,
       3490.726, 3491.861, 3504.798, 3494.202, 3482.183, 3495.005,
       3492.167, 3495.345, 3502.05 , 3463.131])
Expert(Det) Return Avg: 3531.95, std: 2.86
array([3535.884, 3529.237, 3530.751, 3528.768, 3528.549, 3532.258,
       3532.473, 3531.301, 3532.498, 3535.534, 3527.91 , 3534.069,
       3529.424, 3528.349, 3530.316, 3536.745, 3533.737, 3531.831,
       3535.275, 3530.422, 3529.622, 3531.563, 3531.354, 3530.969,
       3536.419, 3534.388, 3531.933, 3531.529, 3530.359, 3531.278,
       3532.376, 3535.49 , 3532.482, 3534.111, 3537.271, 3527.931,
       3529.284, 3532.625, 3530.45 , 3526.306, 3528.79 , 3534.042,
       3531.406, 3530.488, 3531.094, 3532.037, 3530.345, 3531.444,
       3536.181, 3531.904, 3539.595, 3529.632, 3529.518, 3528.406,
       3531.092, 3538.592, 3535.655, 3533.768, 3533.968, 3524.786,
       3533.166, 3530.414, 3532.462, 3532.668])
ordereddict([('seed', 1), ('cuda', -1), ('env', ordereddict([('env_name', 'HopperFH-v0'), ('T', 1000)])), ('sac', ordereddict([('epochs', 1000), ('log_step_interval', 5000), ('update_every', 50), ('update_num', 1), ('random_explore_episodes', 10), ('batch_size', 100), ('lr', 0.001), ('alpha', 0.2), ('automatic_alpha_tuning', False), ('buffer_size', 1000000), ('num_test_episodes', 10)])), ('expert', ordereddict([('samples_episode', 64)]))])